# Start the vLLM OpenAI-compatible API server (module
# vllm.entrypoints.openai.api_server) for the locally stored bge-m3 model.
#
# - CUDA_VISIBLE_DEVICES=0 is set for this command only, so the server
#   process sees just CUDA device index 0.
# - The model is loaded from a local directory and exposed to clients under
#   the name "bge-m3" on port 10526.
# - The remaining flags are passed through to vLLM unchanged: a maximum
#   model length of 8192, float32 dtype, the "embed" task, and permission
#   to run custom code shipped with the model (--trust-remote-code).
CUDA_VISIBLE_DEVICES=0 python -m vllm.entrypoints.openai.api_server \
  --model /home/LB14787_linux/jinke/models/bge-m3-2G \
  --served-model-name bge-m3 \
  --port 10526 \
  --max-model-len 8192 \
  --dtype float32 \
  --task embed \
  --trust-remote-code
